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* C-C increased from 12 to 15 

* Z is average of EQ 
*B is average of ND 

* match with stop is _M; stop-stop = 0; J (joker) match = 0 



Mefine M 



/* value of a match with a stop */ 



f*A*J 
f*B*/ 
/*C*/ 
/*D*/ 

/*£*/ 

/*F*/ 
/*G*/ 
/*H*/ 
1*1*1 

/*K*/ 
/*!.*/ 
/*M*/ 
/*N*/ 

/*o*/ 

/*P*/ 
/*Q*/ 
/*R*/ 
/*S*/ 
/*T*/ 
/*U*/ 
/*V*/ 
/* W*/ 
J*X*f 
j*Y*f 
l*Z*l 

}; 



_day[26][26] = { 

.BCDEFGHIJKLMNOPQRSTUVWXYZ*/ 
{ 2, 0,-2, 0. 0,-4, 1,-1,-1, 0,-1,-2.-1, 0,_M, 1, 0,-2, 1, 1, 0, 0,-6, 0,-3, 0}, 
{ 0, 3,-4, 3, 2,-5, 0, 1,-2, 0, 0,-3,-2, 2, M,-l, 1, 0, 0, 0, 0,-2,-5, 0,-3, 1>, 
{-2,-4,15,-5,-5.-4,-3,-3,-2, 0,-5,-6,-5,-4T_M,-3,-5,^, 0,-2, 0,-2,-8, 0, 0,-5}, 
{ 0, 3,-5, 4, 3,-6, 1, 1,-2, 0, 0,-4,-3, 2,_M,-1, 2,-1, 0, 0, 0,-2,-7, 0,-4, 2}, 
{ 0, 2,-5, 3, 4,-5, 0, 1,-2, 0, 0,-3,-2, 1,_M,-1, 2,-1, 0, 0, 0,-2,-7, 0,-4, 3}, 
{-4,-5,-4,-6,-5, 9,-5,-2, 1. 0,-5, 2, 0,-4,_M,-5,-5,-4.-3,-3, 0,-1, 0, 0, 7,-5}, 
{ 1, 0,-3, 1, 0,-5, 5,-2,-3, 0,-2,^,-3, 0,_M,-l,-l,-3, 1, 0, 0,-1,-7, 0,-5, 0}, 
{-1, 1,-3, 1, 1,-2,-2, 6,-2, 0, 0,-2,-2, 2,_M. 0, 3, 2,-1,-1, 0,-2,-3, 0, 0, 2}, 
{-1,-2,-2,-2,-2, 1,-3,-2, 5, 0,-2, 2, 2,-2,_M.-2,-2,-2,-l, 0, 0, 4,-5, 0,-1,-2}, 
{ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,_M, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, 
{-1. 0,-5, 0, 0,-5,-2, 0,-2, 0, 5,-3, 0, 1,_M,-1, 1, 3. 0, 0, 0,-2,-3, 0,-4, 0}, 
{-2,-3,-6,-4,-3, 2,-4,-2, 2, 0,-3, 6, 4,-3,_M,-3,-2,-3,-3,-l, 0, 2,-2, 0,-1,-2}, 
{-1,-2,-5,-3,-2, 0,-3,-2, 2, 0, 0, 4, 6,-2,_M,-2,-l, 0,-2,-1, 0, 2,-4, 0,-2,-1}, 
{ 0, 2,-4, 2, 1,-4, 0, 2,-2, 0, 1,-3,-2, 2,_M,-1, 1, 0, 1, 0, 0,-2,-t, 0,-2, 1}, 

{_M,_M,_M,_M,_M,_M,_M,_M,_M,_M,_M,_M,_M,_M, 0,_M,_M,_M,_M,_M,_M, M,_M, M, M, M}, 

{ 1,-1,-3,-1,-1,-5,-1, 0,-2, 0,-l,-3,-2,-l,_M, 6, 0, 0, 1, 0, 0,-1,-6, 0,-5, 0}, 

{ 0, 1,-5, 2, 2,-5,-1, 3,-2, 0, 1,-2,-1, 1,_M, 0, 4, 1,-1,-1, 0,-2,-5. 0,-4, 3}, 

{-2, 0,-4,-1,-1,-4,-3, 2,-2, 0, 3,-3, 0, 0,_M, 0, 1, 6, 0,-1, 0,-2, 2, 0,-4, 0}, 

{ 1, 0, 0, 0, 0,-3, 1,-1,-1, 0, 0,-3,-2, 1,_M, 1,-1, 0, 2, 1, 0,-1,-2, 0,-3, 0}, 

{ 1, 0,-2, 0, 0,-3, 0,-1, 0, 0, 0,-1,-1, 0,_M, 0,-1,-1, 1, 3, 0, 0,-5, 0,-3, 0}, 

{ 0, 0, 0. 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,_M, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, 

{ 0,-2,-2,-2,-2,-1,-1,-2, 4, 0,-2, 2, 2,-2,_M,-l ,-2,-2,-1, 0, 0, 4,-6, 0,-2,-2}, 

{-6,-5,-8,-7,-7, 0,-7,-3,-5, 0,-3,-2,-4,-4,_M.-6,-5, 2,-2,-5, 0,-6,17, 0, 0,-6}, 

{ 0, 0, 0, 0, 0, 0, 0, 0. 0, 0, 0, 0, 0, 0,_M, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0}, 

{-3,-3, 0,-4,-4, 7,-5, 0,-1, 0,-4,-l,-2,-2,_M,-5,-4,-4,-3,-3, 0,-2, 0, 0,10,-4}, 

{ 0, 1,-5, 2, 3,-5, 0, 2,-2, 0, 0,-2.-1, 1,_M, 0, 3, 0, 0, 0, 0,-2,-6, 0,-4, 4} 
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Table 1 (conV) 
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include 
jS^cIude 



<stdio.h> 
<ctype.h> 



#define 


MAXJMP 


16 


Mefine 


MAXGAP 


24 


#de6ne 


JMPS 


1024 


Mefine 


MX 


4 


^define 


DMAT 


3 


Mefine 


DMIS 


0 




DINSO 


8 


jS'define 


DINSl 


1 


^define 


PINSO 


8 


Mefine 


pmsi 


4 



/* max jumps in a diag */ 

/* don't continue to penaUze gaps larger than this */ 
/* max jmps in an path */ 

/* save if there's at least MX-1 bases since last jmp */ 

/* value of matching bases */ 

/* penalty for mismatched bases */ 

/* penalty for a gap */ 

/* penalty per base */ 

/* penalty for a gap */ 

/* penalty per residue */ 



struct jmp { 

short 

unsigned short 

}; 

struct di:^ { 
int 
long 
short 
struct jmp 



nIMAXJMP]; 
xlMAXJMP]; 



ijmp; 



/* size of jmp (neg for dely) */ 
/* base no. of jmp in seq x */ 
/* limits seq to 2^16 -1 */ 



/* score at I^t jmp */ 
/* offset of prev block */ 
/* current jmp index */ 
/* list of jmps */ 



:tpath{ 





int 


spc; 


/* number of leading spaces */ 




short 


n[JMPS]: 


/* size of jmp (gap) */ 


}: 


int 


x[JMPS]; 


/* loc of jmp (last elem before gap) */ 






*ofile; 


/* ou^ut file name */ 


char 




*namex[2]; 


/* seq names: getseqsQ */ 


char 




*prog; 


/* prog name for err msgs */ 






*seqx[2]; 


/* seqs: getseqsQ */ 


int 




dmax; 


/* best diag: nwO */ 


int 




dmaxD; 


/* final diag */ 


int 




dna; 


/* set if dna: mainQ */ 


int 




endgaps; 


/* set if penalizing end gaps */ 


int 




gapx, gapy; 


/* total gaps in seqs */ 


int 




lenO, lenl; 


/* seq lens */ 


int 




ngapx, ngapy; /* total size of gaps */ 


int 




smax; 


/* max score: nwQ */ 


int 




*xbm; 


/* bitmap for matching */ 


long 




ofifeet; 


/* current offset in jmp file */ 


struct 


diag 


*dx; 


/* holds diagonals */ 


struct 


path 


PP[2]; 


/* holds path for seqs */ 


char 




*callocO, *malloc0, *indexO, *strcpyO; 






*getseqO, *g 


_caliocO; 
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Table 1 fcont'> 

/* Needleman-Wunsch alignment program 

* usage: progs fflel file2 

* where filel and file2 are two dna or two protein sequences. 

* The sequences can be in upper- or lower-case an may contain ambiguity 

* Any lines beginning with ';','>' or '<* are ignored 

* Max file length is 65535 (limited by imsigned short x in the jmp struct) 

* A sequence with 1/3 or more of its elements ACGTU is assumed to be DNA 

* Output is in the file "align.out" 

* The program may create a tmp file in /tmp to hold info about traceback. 

* Original version developed under BSD 4.3 on a vax 8650 
*/ 

jj^aclude "nw.h" 
delude "day.h" 

static _dbval[25| = { 

1,14,2,13,0,0,4.11,0,0,12,0,3,15,0,0,0,5,6,8,8,7,9,0,10.0 



_pbval[26] = { 

1, 2 1 (1< < ('D'-'A')) [ (1< < ('N'-'A')), 4, 8, 16, 32, 64. 
128, 256, OxFFFFFFF, 1<<10. 1<<11, 1<<12, 1<<13, 1<<14, 
1<<15, 1<<16, 1<<17, 1<<18, 1<<19, 1<<20, 1<<21, 1< <22, 
1<<23, 1<<24. 1<<25[(1<<CE'-'A'))I(1<<CQ'-'A')) 



30 char *avD; 

{ 

prog = av[0]; 
if(ac!=3){ 

f^rintf(stderr. "usage: %s filel fae2\n", prog); 
35 ^rintf(stderr. "wiiere filel and file2 are two dna or two protein sequences-Vn"); 

^rintf(stderr,"The sequences can be in upper- or lower-case\n"); 

§)rintf(stderr,"Any lines beginning with ';' or ' < ' are ignored\n"); 

fi)rintf(stderr, "Output is in the fde \"align.out\''\n"); 

exit(l); 

40 } 

namex[01 = av[l]; 
namex[l] = av[2]; 
seqx[0] = getseq(namex[0], &len0); 
seqx[ll = getseq(namexEl], &lenl); 
45 xbm = (dna)? jdbval : _pbval; 



55 } 



= 0; /* 1 to penalize endgaps */ 

ofile = "align.out"; /* ouq)ut file */ 

nwQ; /* fill in the matrix, get the possible jmps */ 

readjmpsO; /* get the actual jmps */ 

printO; /* print stats, alignment */ 

cleanup(0); /* unlink any tmp files */ 
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